#ifndef CUFFTDX_FFT_28_FP32_INV_PTX_HPP
#define CUFFTDX_FFT_28_FP32_INV_PTX_HPP



// 28-point single-precision complex transform on 28 values held in rmem,
// implemented as one inline-PTX block. The include guard of this file labels
// it FFT_28 / FP32 / INV.
//
// Parameters:
//   rmem - array of complex<float>; elements rmem[0]..rmem[27] are each read
//          (.x and .y) as "f" input operands and each overwritten (.x and .y)
//          as "=f" output operands.
//   smem - not referenced anywhere in this body.
//
// NOTE(review): the meaning of the template arguments <214, float, 1> is set
// by the primary template, which is not visible in this file - confirm there.
template<> __forceinline__ __device__ void cufftdx_private_function<214, float, 1>(cufftdx::detail::complex<float> *rmem, unsigned smem){

// Operand numbering used by the PTX below:
//   %0..%55    outputs: rmem[k].x is %(2k), rmem[k].y is %(2k+1).
//   %56..%129  inputs, in the order of the constraint list. That list repeats
//              some .y entries (rmem[1].y, rmem[2].y, rmem[4].y, ...), so the
//              input numbers are NOT simply 56+2k. The PTX references only one
//              copy of each repeated operand (for rmem[1].y that is %60, not
//              %59). Do not deduplicate the list without renumbering every %N.
//
// Floating-point immediates are IEEE-754 single-precision hex literals:
//   0f3F1F9D07 ~ 0.62349 ( cos(2*pi/7))    0f3F48261C ~ 0.78183 (sin(2*pi/7))
//   0f3E63DC87 ~ 0.22252 (-cos(4*pi/7))    0f3F7994E0 ~ 0.97493 (sin(4*pi/7))
//   0f3F66A5E5 ~ 0.90097 (-cos(6*pi/7))    0f3EDE2602 ~ 0.43388 (sin(6*pi/7))
// The 0fB....... literals are the same magnitudes with the sign bit set.
//
// Order of work inside the asm block:
//   1. f113..f196: combine the seven inputs rmem[0,4,8,12,16,20,24].
//   2. f197..f280: same pattern on rmem[2,6,10,14,18,22,26].
//   3. f281..f310: scale the results of step 2 by constant complex factors.
//   4. f311..f338: add/sub pairs joining steps 1 and 3.
//   5. f339..f422: seven-input combine of rmem[1,5,9,13,17,21,25].
//   6. f423..f506: seven-input combine of rmem[3,7,11,15,19,23,27].
//   7. f507..f564: scale step 6 and add/sub with step 5.
//   8. f565..f624: scale the results of step 7 by constant complex factors.
//   9. Final add/sub of steps 4 and 8 written to %0..%55.
// NOTE(review): this looks like a 7 x 2 x 2 decomposition of the 28-point
// transform - confirm against the generator that produced this file.
//
// Every input operand (%56 and up) is consumed before the first output operand
// is written (the first write is "add.f32 %1"), so no output write can disturb
// a value that is still needed.
// The ".reg .b64 rd<2>" declaration is not used by any instruction below.
asm volatile (R"({
.reg .f32 f<681>;
.reg .b64 rd<2>;
add.f32 f113, %66, %120;
add.f32 f114, %56, f113;
add.f32 f115, %77, %109;
add.f32 f116, f115, f114;
add.f32 f117, %88, %98;
add.f32 f118, f117, f116;
add.f32 f119, %68, %121;
add.f32 f120, %57, f119;
add.f32 f121, %79, %111;
add.f32 f122, f121, f120;
add.f32 f123, %89, %100;
add.f32 f124, f123, f122;
fma.rn.f32 f125, f113, 0f3F1F9D07, %56;
mul.f32 f126, f115, 0f3E63DC87;
sub.f32 f127, f125, f126;
mul.f32 f128, f117, 0f3F66A5E5;
sub.f32 f129, f127, f128;
sub.f32 f130, %68, %121;
mul.f32 f131, f130, 0f3F48261C;
sub.f32 f132, %79, %111;
fma.rn.f32 f133, f132, 0f3F7994E0, f131;
sub.f32 f134, %89, %100;
fma.rn.f32 f135, f134, 0f3EDE2602, f133;
sub.f32 f136, f129, f135;
add.f32 f137, f135, f129;
mul.f32 f138, f113, 0f3E63DC87;
sub.f32 f139, %56, f138;
mul.f32 f140, f115, 0f3F66A5E5;
sub.f32 f141, f139, f140;
fma.rn.f32 f142, f117, 0f3F1F9D07, f141;
mul.f32 f143, f130, 0f3F7994E0;
mul.f32 f144, f132, 0f3EDE2602;
sub.f32 f145, f143, f144;
mul.f32 f146, f134, 0f3F48261C;
sub.f32 f147, f145, f146;
sub.f32 f148, f142, f147;
add.f32 f149, f147, f142;
mul.f32 f150, f113, 0f3F66A5E5;
sub.f32 f151, %56, f150;
fma.rn.f32 f152, f115, 0f3F1F9D07, f151;
mul.f32 f153, f117, 0f3E63DC87;
sub.f32 f154, f152, f153;
mul.f32 f155, f130, 0f3EDE2602;
mul.f32 f156, f132, 0f3F48261C;
sub.f32 f157, f155, f156;
fma.rn.f32 f158, f134, 0f3F7994E0, f157;
sub.f32 f159, f154, f158;
add.f32 f160, f158, f154;
fma.rn.f32 f161, f119, 0f3F1F9D07, %57;
mul.f32 f162, f121, 0f3E63DC87;
sub.f32 f163, f161, f162;
mul.f32 f164, f123, 0f3F66A5E5;
sub.f32 f165, f163, f164;
sub.f32 f166, %66, %120;
mul.f32 f167, f166, 0f3F48261C;
sub.f32 f168, %77, %109;
fma.rn.f32 f169, f168, 0f3F7994E0, f167;
sub.f32 f170, %88, %98;
fma.rn.f32 f171, f170, 0f3EDE2602, f169;
add.f32 f172, f171, f165;
sub.f32 f173, f165, f171;
mul.f32 f174, f119, 0f3E63DC87;
sub.f32 f175, %57, f174;
mul.f32 f176, f121, 0f3F66A5E5;
sub.f32 f177, f175, f176;
fma.rn.f32 f178, f123, 0f3F1F9D07, f177;
mul.f32 f179, f166, 0f3F7994E0;
mul.f32 f180, f168, 0f3EDE2602;
sub.f32 f181, f179, f180;
mul.f32 f182, f170, 0f3F48261C;
sub.f32 f183, f181, f182;
add.f32 f184, f183, f178;
sub.f32 f185, f178, f183;
mul.f32 f186, f119, 0f3F66A5E5;
sub.f32 f187, %57, f186;
fma.rn.f32 f188, f121, 0f3F1F9D07, f187;
mul.f32 f189, f123, 0f3E63DC87;
sub.f32 f190, f188, f189;
mul.f32 f191, f166, 0f3EDE2602;
mul.f32 f192, f168, 0f3F48261C;
sub.f32 f193, f191, f192;
fma.rn.f32 f194, f170, 0f3F7994E0, f193;
add.f32 f195, f194, f190;
sub.f32 f196, f190, f194;
add.f32 f197, %72, %125;
add.f32 f198, %61, f197;
add.f32 f199, %82, %114;
add.f32 f200, f199, f198;
add.f32 f201, %93, %104;
add.f32 f202, f201, f200;
add.f32 f203, %73, %127;
add.f32 f204, %63, f203;
add.f32 f205, %84, %116;
add.f32 f206, f205, f204;
add.f32 f207, %95, %105;
add.f32 f208, f207, f206;
fma.rn.f32 f209, f197, 0f3F1F9D07, %61;
mul.f32 f210, f199, 0f3E63DC87;
sub.f32 f211, f209, f210;
mul.f32 f212, f201, 0f3F66A5E5;
sub.f32 f213, f211, f212;
sub.f32 f214, %73, %127;
mul.f32 f215, f214, 0f3F48261C;
sub.f32 f216, %84, %116;
fma.rn.f32 f217, f216, 0f3F7994E0, f215;
sub.f32 f218, %95, %105;
fma.rn.f32 f219, f218, 0f3EDE2602, f217;
sub.f32 f220, f213, f219;
add.f32 f221, f219, f213;
mul.f32 f222, f197, 0f3E63DC87;
sub.f32 f223, %61, f222;
mul.f32 f224, f199, 0f3F66A5E5;
sub.f32 f225, f223, f224;
fma.rn.f32 f226, f201, 0f3F1F9D07, f225;
mul.f32 f227, f214, 0f3F7994E0;
mul.f32 f228, f216, 0f3EDE2602;
sub.f32 f229, f227, f228;
mul.f32 f230, f218, 0f3F48261C;
sub.f32 f231, f229, f230;
sub.f32 f232, f226, f231;
add.f32 f233, f231, f226;
mul.f32 f234, f197, 0f3F66A5E5;
sub.f32 f235, %61, f234;
fma.rn.f32 f236, f199, 0f3F1F9D07, f235;
mul.f32 f237, f201, 0f3E63DC87;
sub.f32 f238, f236, f237;
mul.f32 f239, f214, 0f3EDE2602;
mul.f32 f240, f216, 0f3F48261C;
sub.f32 f241, f239, f240;
fma.rn.f32 f242, f218, 0f3F7994E0, f241;
sub.f32 f243, f238, f242;
add.f32 f244, f242, f238;
fma.rn.f32 f245, f203, 0f3F1F9D07, %63;
mul.f32 f246, f205, 0f3E63DC87;
sub.f32 f247, f245, f246;
mul.f32 f248, f207, 0f3F66A5E5;
sub.f32 f249, f247, f248;
sub.f32 f250, %72, %125;
mul.f32 f251, f250, 0f3F48261C;
sub.f32 f252, %82, %114;
fma.rn.f32 f253, f252, 0f3F7994E0, f251;
sub.f32 f254, %93, %104;
fma.rn.f32 f255, f254, 0f3EDE2602, f253;
add.f32 f256, f255, f249;
sub.f32 f257, f249, f255;
mul.f32 f258, f203, 0f3E63DC87;
sub.f32 f259, %63, f258;
mul.f32 f260, f205, 0f3F66A5E5;
sub.f32 f261, f259, f260;
fma.rn.f32 f262, f207, 0f3F1F9D07, f261;
mul.f32 f263, f250, 0f3F7994E0;
mul.f32 f264, f252, 0f3EDE2602;
sub.f32 f265, f263, f264;
mul.f32 f266, f254, 0f3F48261C;
sub.f32 f267, f265, f266;
add.f32 f268, f267, f262;
sub.f32 f269, f262, f267;
mul.f32 f270, f203, 0f3F66A5E5;
sub.f32 f271, %63, f270;
fma.rn.f32 f272, f205, 0f3F1F9D07, f271;
mul.f32 f273, f207, 0f3E63DC87;
sub.f32 f274, f272, f273;
mul.f32 f275, f250, 0f3EDE2602;
mul.f32 f276, f252, 0f3F48261C;
sub.f32 f277, f275, f276;
fma.rn.f32 f278, f254, 0f3F7994E0, f277;
add.f32 f279, f278, f274;
sub.f32 f280, f274, f278;
mul.f32 f281, f220, 0f3F66A5E5;
mul.f32 f282, f256, 0f3EDE2602;
sub.f32 f283, f281, f282;
mul.f32 f284, f256, 0f3F66A5E5;
fma.rn.f32 f285, f220, 0f3EDE2602, f284;
mul.f32 f286, f232, 0f3F1F9D07;
mul.f32 f287, f268, 0f3F48261C;
sub.f32 f288, f286, f287;
mul.f32 f289, f268, 0f3F1F9D07;
fma.rn.f32 f290, f232, 0f3F48261C, f289;
mul.f32 f291, f243, 0f3E63DC87;
mul.f32 f292, f279, 0f3F7994E0;
sub.f32 f293, f291, f292;
mul.f32 f294, f279, 0f3E63DC87;
fma.rn.f32 f295, f243, 0f3F7994E0, f294;
mul.f32 f296, f244, 0fBE63DC87;
mul.f32 f297, f280, 0f3F7994E0;
sub.f32 f298, f296, f297;
mul.f32 f299, f280, 0fBE63DC87;
fma.rn.f32 f300, f244, 0f3F7994E0, f299;
mul.f32 f301, f233, 0fBF1F9D07;
mul.f32 f302, f269, 0f3F48261C;
sub.f32 f303, f301, f302;
mul.f32 f304, f269, 0fBF1F9D07;
fma.rn.f32 f305, f233, 0f3F48261C, f304;
mul.f32 f306, f221, 0fBF66A5E5;
mul.f32 f307, f257, 0f3EDE2602;
sub.f32 f308, f306, f307;
mul.f32 f309, f257, 0fBF66A5E5;
fma.rn.f32 f310, f221, 0f3EDE2602, f309;
add.f32 f311, f118, f202;
add.f32 f312, f124, f208;
sub.f32 f313, f118, f202;
sub.f32 f314, f124, f208;
add.f32 f315, f136, f283;
add.f32 f316, f172, f285;
sub.f32 f317, f136, f283;
sub.f32 f318, f172, f285;
add.f32 f319, f148, f288;
add.f32 f320, f184, f290;
sub.f32 f321, f148, f288;
sub.f32 f322, f184, f290;
add.f32 f323, f159, f293;
add.f32 f324, f195, f295;
sub.f32 f325, f159, f293;
sub.f32 f326, f195, f295;
add.f32 f327, f160, f298;
add.f32 f328, f196, f300;
sub.f32 f329, f160, f298;
sub.f32 f330, f196, f300;
add.f32 f331, f149, f303;
add.f32 f332, f185, f305;
sub.f32 f333, f149, f303;
sub.f32 f334, f185, f305;
add.f32 f335, f137, f308;
add.f32 f336, f173, f310;
sub.f32 f337, f137, f308;
sub.f32 f338, f173, f310;
add.f32 f339, %69, %122;
add.f32 f340, %58, f339;
add.f32 f341, %80, %112;
add.f32 f342, f341, f340;
add.f32 f343, %90, %101;
add.f32 f344, f343, f342;
add.f32 f345, %71, %124;
add.f32 f346, %60, f345;
add.f32 f347, %81, %113;
add.f32 f348, f347, f346;
add.f32 f349, %92, %103;
add.f32 f350, f349, f348;
fma.rn.f32 f351, f339, 0f3F1F9D07, %58;
mul.f32 f352, f341, 0f3E63DC87;
sub.f32 f353, f351, f352;
mul.f32 f354, f343, 0f3F66A5E5;
sub.f32 f355, f353, f354;
sub.f32 f356, %71, %124;
mul.f32 f357, f356, 0f3F48261C;
sub.f32 f358, %81, %113;
fma.rn.f32 f359, f358, 0f3F7994E0, f357;
sub.f32 f360, %92, %103;
fma.rn.f32 f361, f360, 0f3EDE2602, f359;
sub.f32 f362, f355, f361;
add.f32 f363, f361, f355;
mul.f32 f364, f339, 0f3E63DC87;
sub.f32 f365, %58, f364;
mul.f32 f366, f341, 0f3F66A5E5;
sub.f32 f367, f365, f366;
fma.rn.f32 f368, f343, 0f3F1F9D07, f367;
mul.f32 f369, f356, 0f3F7994E0;
mul.f32 f370, f358, 0f3EDE2602;
sub.f32 f371, f369, f370;
mul.f32 f372, f360, 0f3F48261C;
sub.f32 f373, f371, f372;
sub.f32 f374, f368, f373;
add.f32 f375, f373, f368;
mul.f32 f376, f339, 0f3F66A5E5;
sub.f32 f377, %58, f376;
fma.rn.f32 f378, f341, 0f3F1F9D07, f377;
mul.f32 f379, f343, 0f3E63DC87;
sub.f32 f380, f378, f379;
mul.f32 f381, f356, 0f3EDE2602;
mul.f32 f382, f358, 0f3F48261C;
sub.f32 f383, f381, f382;
fma.rn.f32 f384, f360, 0f3F7994E0, f383;
sub.f32 f385, f380, f384;
add.f32 f386, f384, f380;
fma.rn.f32 f387, f345, 0f3F1F9D07, %60;
mul.f32 f388, f347, 0f3E63DC87;
sub.f32 f389, f387, f388;
mul.f32 f390, f349, 0f3F66A5E5;
sub.f32 f391, f389, f390;
sub.f32 f392, %69, %122;
mul.f32 f393, f392, 0f3F48261C;
sub.f32 f394, %80, %112;
fma.rn.f32 f395, f394, 0f3F7994E0, f393;
sub.f32 f396, %90, %101;
fma.rn.f32 f397, f396, 0f3EDE2602, f395;
add.f32 f398, f397, f391;
sub.f32 f399, f391, f397;
mul.f32 f400, f345, 0f3E63DC87;
sub.f32 f401, %60, f400;
mul.f32 f402, f347, 0f3F66A5E5;
sub.f32 f403, f401, f402;
fma.rn.f32 f404, f349, 0f3F1F9D07, f403;
mul.f32 f405, f392, 0f3F7994E0;
mul.f32 f406, f394, 0f3EDE2602;
sub.f32 f407, f405, f406;
mul.f32 f408, f396, 0f3F48261C;
sub.f32 f409, f407, f408;
add.f32 f410, f409, f404;
sub.f32 f411, f404, f409;
mul.f32 f412, f345, 0f3F66A5E5;
sub.f32 f413, %60, f412;
fma.rn.f32 f414, f347, 0f3F1F9D07, f413;
mul.f32 f415, f349, 0f3E63DC87;
sub.f32 f416, f414, f415;
mul.f32 f417, f392, 0f3EDE2602;
mul.f32 f418, f394, 0f3F48261C;
sub.f32 f419, f417, f418;
fma.rn.f32 f420, f396, 0f3F7994E0, f419;
add.f32 f421, f420, f416;
sub.f32 f422, f416, f420;
add.f32 f423, %74, %128;
add.f32 f424, %64, f423;
add.f32 f425, %85, %117;
add.f32 f426, f425, f424;
add.f32 f427, %96, %106;
add.f32 f428, f427, f426;
add.f32 f429, %76, %129;
add.f32 f430, %65, f429;
add.f32 f431, %87, %119;
add.f32 f432, f431, f430;
add.f32 f433, %97, %108;
add.f32 f434, f433, f432;
fma.rn.f32 f435, f423, 0f3F1F9D07, %64;
mul.f32 f436, f425, 0f3E63DC87;
sub.f32 f437, f435, f436;
mul.f32 f438, f427, 0f3F66A5E5;
sub.f32 f439, f437, f438;
sub.f32 f440, %76, %129;
mul.f32 f441, f440, 0f3F48261C;
sub.f32 f442, %87, %119;
fma.rn.f32 f443, f442, 0f3F7994E0, f441;
sub.f32 f444, %97, %108;
fma.rn.f32 f445, f444, 0f3EDE2602, f443;
sub.f32 f446, f439, f445;
add.f32 f447, f445, f439;
mul.f32 f448, f423, 0f3E63DC87;
sub.f32 f449, %64, f448;
mul.f32 f450, f425, 0f3F66A5E5;
sub.f32 f451, f449, f450;
fma.rn.f32 f452, f427, 0f3F1F9D07, f451;
mul.f32 f453, f440, 0f3F7994E0;
mul.f32 f454, f442, 0f3EDE2602;
sub.f32 f455, f453, f454;
mul.f32 f456, f444, 0f3F48261C;
sub.f32 f457, f455, f456;
sub.f32 f458, f452, f457;
add.f32 f459, f457, f452;
mul.f32 f460, f423, 0f3F66A5E5;
sub.f32 f461, %64, f460;
fma.rn.f32 f462, f425, 0f3F1F9D07, f461;
mul.f32 f463, f427, 0f3E63DC87;
sub.f32 f464, f462, f463;
mul.f32 f465, f440, 0f3EDE2602;
mul.f32 f466, f442, 0f3F48261C;
sub.f32 f467, f465, f466;
fma.rn.f32 f468, f444, 0f3F7994E0, f467;
sub.f32 f469, f464, f468;
add.f32 f470, f468, f464;
fma.rn.f32 f471, f429, 0f3F1F9D07, %65;
mul.f32 f472, f431, 0f3E63DC87;
sub.f32 f473, f471, f472;
mul.f32 f474, f433, 0f3F66A5E5;
sub.f32 f475, f473, f474;
sub.f32 f476, %74, %128;
mul.f32 f477, f476, 0f3F48261C;
sub.f32 f478, %85, %117;
fma.rn.f32 f479, f478, 0f3F7994E0, f477;
sub.f32 f480, %96, %106;
fma.rn.f32 f481, f480, 0f3EDE2602, f479;
add.f32 f482, f481, f475;
sub.f32 f483, f475, f481;
mul.f32 f484, f429, 0f3E63DC87;
sub.f32 f485, %65, f484;
mul.f32 f486, f431, 0f3F66A5E5;
sub.f32 f487, f485, f486;
fma.rn.f32 f488, f433, 0f3F1F9D07, f487;
mul.f32 f489, f476, 0f3F7994E0;
mul.f32 f490, f478, 0f3EDE2602;
sub.f32 f491, f489, f490;
mul.f32 f492, f480, 0f3F48261C;
sub.f32 f493, f491, f492;
add.f32 f494, f493, f488;
sub.f32 f495, f488, f493;
mul.f32 f496, f429, 0f3F66A5E5;
sub.f32 f497, %65, f496;
fma.rn.f32 f498, f431, 0f3F1F9D07, f497;
mul.f32 f499, f433, 0f3E63DC87;
sub.f32 f500, f498, f499;
mul.f32 f501, f476, 0f3EDE2602;
mul.f32 f502, f478, 0f3F48261C;
sub.f32 f503, f501, f502;
fma.rn.f32 f504, f480, 0f3F7994E0, f503;
add.f32 f505, f504, f500;
sub.f32 f506, f500, f504;
mul.f32 f507, f446, 0f3F66A5E5;
mul.f32 f508, f482, 0f3EDE2602;
sub.f32 f509, f507, f508;
mul.f32 f510, f482, 0f3F66A5E5;
fma.rn.f32 f511, f446, 0f3EDE2602, f510;
mul.f32 f512, f458, 0f3F1F9D07;
mul.f32 f513, f494, 0f3F48261C;
sub.f32 f514, f512, f513;
mul.f32 f515, f494, 0f3F1F9D07;
fma.rn.f32 f516, f458, 0f3F48261C, f515;
mul.f32 f517, f469, 0f3E63DC87;
mul.f32 f518, f505, 0f3F7994E0;
sub.f32 f519, f517, f518;
mul.f32 f520, f505, 0f3E63DC87;
fma.rn.f32 f521, f469, 0f3F7994E0, f520;
mul.f32 f522, f470, 0fBE63DC87;
mul.f32 f523, f506, 0f3F7994E0;
sub.f32 f524, f522, f523;
mul.f32 f525, f506, 0fBE63DC87;
fma.rn.f32 f526, f470, 0f3F7994E0, f525;
mul.f32 f527, f459, 0fBF1F9D07;
mul.f32 f528, f495, 0f3F48261C;
sub.f32 f529, f527, f528;
mul.f32 f530, f495, 0fBF1F9D07;
fma.rn.f32 f531, f459, 0f3F48261C, f530;
mul.f32 f532, f447, 0fBF66A5E5;
mul.f32 f533, f483, 0f3EDE2602;
sub.f32 f534, f532, f533;
mul.f32 f535, f483, 0fBF66A5E5;
fma.rn.f32 f536, f447, 0f3EDE2602, f535;
add.f32 f537, f344, f428;
add.f32 f538, f350, f434;
sub.f32 f539, f344, f428;
sub.f32 f540, f350, f434;
add.f32 f541, f362, f509;
add.f32 f542, f398, f511;
sub.f32 f543, f362, f509;
sub.f32 f544, f398, f511;
add.f32 f545, f374, f514;
add.f32 f546, f410, f516;
sub.f32 f547, f374, f514;
sub.f32 f548, f410, f516;
add.f32 f549, f385, f519;
add.f32 f550, f421, f521;
sub.f32 f551, f385, f519;
sub.f32 f552, f421, f521;
add.f32 f553, f386, f524;
add.f32 f554, f422, f526;
sub.f32 f555, f386, f524;
sub.f32 f556, f422, f526;
add.f32 f557, f375, f529;
add.f32 f558, f411, f531;
sub.f32 f559, f375, f529;
sub.f32 f560, f411, f531;
add.f32 f561, f363, f534;
add.f32 f562, f399, f536;
sub.f32 f563, f363, f534;
sub.f32 f564, f399, f536;
mul.f32 f565, f541, 0f3F7994E0;
mul.f32 f566, f542, 0f3E63DC87;
sub.f32 f567, f565, f566;
mul.f32 f568, f542, 0f3F7994E0;
fma.rn.f32 f569, f541, 0f3E63DC87, f568;
mul.f32 f570, f545, 0f3F66A5E5;
mul.f32 f571, f546, 0f3EDE2602;
sub.f32 f572, f570, f571;
mul.f32 f573, f546, 0f3F66A5E5;
fma.rn.f32 f574, f545, 0f3EDE2602, f573;
mul.f32 f575, f549, 0f3F48261C;
mul.f32 f576, f550, 0f3F1F9D07;
sub.f32 f577, f575, f576;
mul.f32 f578, f550, 0f3F48261C;
fma.rn.f32 f579, f549, 0f3F1F9D07, f578;
mul.f32 f580, f553, 0f3F1F9D07;
mul.f32 f581, f554, 0f3F48261C;
sub.f32 f582, f580, f581;
mul.f32 f583, f554, 0f3F1F9D07;
fma.rn.f32 f584, f553, 0f3F48261C, f583;
mul.f32 f585, f557, 0f3EDE2602;
mul.f32 f586, f558, 0f3F66A5E5;
sub.f32 f587, f585, f586;
mul.f32 f588, f558, 0f3EDE2602;
fma.rn.f32 f589, f557, 0f3F66A5E5, f588;
mul.f32 f590, f561, 0f3E63DC87;
mul.f32 f591, f562, 0f3F7994E0;
sub.f32 f592, f590, f591;
mul.f32 f593, f562, 0f3E63DC87;
fma.rn.f32 f594, f561, 0f3F7994E0, f593;
mul.f32 f595, f543, 0fBE63DC87;
mul.f32 f596, f544, 0f3F7994E0;
sub.f32 f597, f595, f596;
mul.f32 f598, f544, 0fBE63DC87;
fma.rn.f32 f599, f543, 0f3F7994E0, f598;
mul.f32 f600, f547, 0fBEDE2602;
mul.f32 f601, f548, 0f3F66A5E5;
sub.f32 f602, f600, f601;
mul.f32 f603, f548, 0fBEDE2602;
fma.rn.f32 f604, f547, 0f3F66A5E5, f603;
mul.f32 f605, f551, 0fBF1F9D07;
mul.f32 f606, f552, 0f3F48261C;
sub.f32 f607, f605, f606;
mul.f32 f608, f552, 0fBF1F9D07;
fma.rn.f32 f609, f551, 0f3F48261C, f608;
mul.f32 f610, f555, 0fBF48261C;
mul.f32 f611, f556, 0f3F1F9D07;
sub.f32 f612, f610, f611;
mul.f32 f613, f556, 0fBF48261C;
fma.rn.f32 f614, f555, 0f3F1F9D07, f613;
mul.f32 f615, f559, 0fBF66A5E5;
mul.f32 f616, f560, 0f3EDE2602;
sub.f32 f617, f615, f616;
mul.f32 f618, f560, 0fBF66A5E5;
fma.rn.f32 f619, f559, 0f3EDE2602, f618;
mul.f32 f620, f563, 0fBF7994E0;
mul.f32 f621, f564, 0f3E63DC87;
sub.f32 f622, f620, f621;
mul.f32 f623, f564, 0fBF7994E0;
fma.rn.f32 f624, f563, 0f3E63DC87, f623;
add.f32 %1, f312, f538;
add.f32 %0, f311, f537;
add.f32 %3, f316, f569;
add.f32 %2, f315, f567;
add.f32 %5, f320, f574;
add.f32 %4, f319, f572;
add.f32 %7, f324, f579;
add.f32 %6, f323, f577;
add.f32 %9, f328, f584;
add.f32 %8, f327, f582;
add.f32 %11, f332, f589;
add.f32 %10, f331, f587;
add.f32 %13, f336, f594;
add.f32 %12, f335, f592;
add.f32 %15, f314, f539;
sub.f32 %14, f313, f540;
add.f32 %17, f318, f599;
add.f32 %16, f317, f597;
add.f32 %19, f322, f604;
add.f32 %18, f321, f602;
add.f32 %21, f326, f609;
add.f32 %20, f325, f607;
add.f32 %23, f330, f614;
add.f32 %22, f329, f612;
add.f32 %25, f334, f619;
add.f32 %24, f333, f617;
add.f32 %27, f338, f624;
add.f32 %26, f337, f622;
sub.f32 %29, f312, f538;
sub.f32 %28, f311, f537;
sub.f32 %31, f316, f569;
sub.f32 %30, f315, f567;
sub.f32 %33, f320, f574;
sub.f32 %32, f319, f572;
sub.f32 %35, f324, f579;
sub.f32 %34, f323, f577;
sub.f32 %37, f328, f584;
sub.f32 %36, f327, f582;
sub.f32 %39, f332, f589;
sub.f32 %38, f331, f587;
sub.f32 %41, f336, f594;
sub.f32 %40, f335, f592;
sub.f32 %43, f314, f539;
add.f32 %42, f313, f540;
sub.f32 %45, f318, f599;
sub.f32 %44, f317, f597;
sub.f32 %47, f322, f604;
sub.f32 %46, f321, f602;
sub.f32 %49, f326, f609;
sub.f32 %48, f325, f607;
sub.f32 %51, f330, f614;
sub.f32 %50, f329, f612;
sub.f32 %53, f334, f619;
sub.f32 %52, f333, f617;
sub.f32 %55, f338, f624;
sub.f32 %54, f337, f622;
})"
     : "=f"(rmem[0].x), "=f"(rmem[0].y), "=f"(rmem[1].x), "=f"(rmem[1].y), "=f"(rmem[2].x), "=f"(rmem[2].y), "=f"(rmem[3].x), "=f"(rmem[3].y), "=f"(rmem[4].x), "=f"(rmem[4].y), "=f"(rmem[5].x), "=f"(rmem[5].y), "=f"(rmem[6].x), "=f"(rmem[6].y), "=f"(rmem[7].x), "=f"(rmem[7].y), "=f"(rmem[8].x), "=f"(rmem[8].y), "=f"(rmem[9].x), "=f"(rmem[9].y), "=f"(rmem[10].x), "=f"(rmem[10].y), "=f"(rmem[11].x), "=f"(rmem[11].y), "=f"(rmem[12].x), "=f"(rmem[12].y), "=f"(rmem[13].x), "=f"(rmem[13].y), "=f"(rmem[14].x), "=f"(rmem[14].y), "=f"(rmem[15].x), "=f"(rmem[15].y), "=f"(rmem[16].x), "=f"(rmem[16].y), "=f"(rmem[17].x), "=f"(rmem[17].y), "=f"(rmem[18].x), "=f"(rmem[18].y), "=f"(rmem[19].x), "=f"(rmem[19].y), "=f"(rmem[20].x), "=f"(rmem[20].y), "=f"(rmem[21].x), "=f"(rmem[21].y), "=f"(rmem[22].x), "=f"(rmem[22].y), "=f"(rmem[23].x), "=f"(rmem[23].y), "=f"(rmem[24].x), "=f"(rmem[24].y), "=f"(rmem[25].x), "=f"(rmem[25].y), "=f"(rmem[26].x), "=f"(rmem[26].y), "=f"(rmem[27].x), "=f"(rmem[27].y): "f"(rmem[0].x), "f"(rmem[0].y), "f"(rmem[1].x), "f"(rmem[1].y), "f"(rmem[1].y), "f"(rmem[2].x), "f"(rmem[2].y), "f"(rmem[2].y), "f"(rmem[3].x), "f"(rmem[3].y), "f"(rmem[4].x), "f"(rmem[4].y), "f"(rmem[4].y), "f"(rmem[5].x), "f"(rmem[5].y), "f"(rmem[5].y), "f"(rmem[6].x), "f"(rmem[6].y), "f"(rmem[7].x), "f"(rmem[7].y), "f"(rmem[7].y), "f"(rmem[8].x), "f"(rmem[8].y), "f"(rmem[8].y), "f"(rmem[9].x), "f"(rmem[9].y), "f"(rmem[10].x), "f"(rmem[10].y), "f"(rmem[10].y), "f"(rmem[11].x), "f"(rmem[11].y), "f"(rmem[11].y), "f"(rmem[12].x), "f"(rmem[12].y), "f"(rmem[13].x), "f"(rmem[13].y), "f"(rmem[13].y), "f"(rmem[14].x), "f"(rmem[14].y), "f"(rmem[14].y), "f"(rmem[15].x), "f"(rmem[15].y), "f"(rmem[16].x), "f"(rmem[16].y), "f"(rmem[16].y), "f"(rmem[17].x), "f"(rmem[17].y), "f"(rmem[17].y), "f"(rmem[18].x), "f"(rmem[18].y), "f"(rmem[19].x), "f"(rmem[19].y), "f"(rmem[19].y), "f"(rmem[20].x), "f"(rmem[20].y), "f"(rmem[20].y), "f"(rmem[21].x), "f"(rmem[21].y), "f"(rmem[22].x), "f"(rmem[22].y), 
"f"(rmem[22].y), "f"(rmem[23].x), "f"(rmem[23].y), "f"(rmem[23].y), "f"(rmem[24].x), "f"(rmem[24].y), "f"(rmem[25].x), "f"(rmem[25].y), "f"(rmem[25].y), "f"(rmem[26].x), "f"(rmem[26].y), "f"(rmem[26].y), "f"(rmem[27].x), "f"(rmem[27].y));
};


#endif
